# -*- coding: utf-8 -*-
import pandas as pd

# Time format used for exports: a strftime-style pattern producing
# zero-padded year, month and day with no separators (e.g. 20240131).
LOG_TIME_FORMAT = '%Y%m%d'


def preprocessing(file_path: str, column_names: list) -> pd.DataFrame:
    """
    Load a CSV file and keep only the requested columns.

    :param file_path: Path of the CSV file to read
    :param column_names: Names of the columns to keep; the result's columns
        follow the order given here
    :return: DataFrame restricted to the selected columns
    """
    # Read the complete file first, then narrow it down to the useful fields.
    return pd.read_csv(file_path)[column_names]
